{
 "cells": [
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "> 1. 城市： '北京'、 '上海'、 '广州'、'深圳'\n",
    "> 2. 关键词：4A广告公司，广告策划，广告文案，行销策划\n",
    "> 3. 工作经验：'应届生'、 '实习生'、 '1年以内'、 '1-3年'、'3-5年'、 '5-10年'、'10年以上'\n",
    "> 4. 学历：本科及本科以上"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {
    "scrolled": true
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "登录cookie __gc_id=72ec0caa79ef4ee0bf7232d23b95a349; _ga=GA1.1.1375856594.1681904278; __uuid=1681904283335.17; __tlog=1701425302634.08%7C00000000%7C00000000%7Csm_pc_003%7Csm_pc_003; XSRF-TOKEN=HuFQfP6JRByGViwOkv9YhQ; Hm_lvt_a2647413544f5a04f00da7eee0d5e200=1701343478,1701425307; _ga_54YTJKWN86=GS1.1.1701440724.12.1.1701441044.0.0.0; __session_seq=8; __tlg_event_seq=61; Hm_lpvt_a2647413544f5a04f00da7eee0d5e200=1701441045\n",
      "这是第1页，接下来将先等待6秒...然后以继续抓取\n",
      "这是第2页，接下来将先等待8秒...然后以继续抓取\n",
      "这是第3页，接下来将先等待6秒...然后以继续抓取\n",
      "这是第4页，接下来将先等待6秒...然后以继续抓取\n",
      "这是第5页，接下来将先等待7秒...然后以继续抓取\n",
      "这是第6页，接下来将先等待6秒...然后以继续抓取\n",
      "这是第7页，接下来将先等待7秒...然后以继续抓取\n",
      "这是第8页，接下来将先等待6秒...然后以继续抓取\n",
      "这是第9页，接下来将先等待3秒...然后以继续抓取\n",
      "这是第10页，接下来将先等待3秒...然后以继续抓取\n"
     ]
    },
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>dataInfo</th>\n",
       "      <th>dataParams</th>\n",
       "      <th>comp.compScale</th>\n",
       "      <th>comp.link</th>\n",
       "      <th>comp.compName</th>\n",
       "      <th>comp.compLogo</th>\n",
       "      <th>comp.compId</th>\n",
       "      <th>comp.compIndustry</th>\n",
       "      <th>job.labels</th>\n",
       "      <th>job.salary</th>\n",
       "      <th>...</th>\n",
       "      <th>job.advViewFlag</th>\n",
       "      <th>job.dataPromId</th>\n",
       "      <th>recruiter.recruiterId</th>\n",
       "      <th>recruiter.chatted</th>\n",
       "      <th>recruiter.imId</th>\n",
       "      <th>recruiter.imUserType</th>\n",
       "      <th>recruiter.recruiterName</th>\n",
       "      <th>recruiter.recruiterTitle</th>\n",
       "      <th>recruiter.recruiterPhoto</th>\n",
       "      <th>comp.compStage</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>%7B%22ckId%22%3A%22y2jy1uvl2gar8xipyemg77rijoo...</td>\n",
       "      <td>{\"jobKind\":\"2\",\"imId\":\"cd5d1ab00be1dd1855a0b65...</td>\n",
       "      <td>1-49人</td>\n",
       "      <td>https://www.liepin.com/company/7887755/</td>\n",
       "      <td>北京志健金瑞生物医药科技有限公司</td>\n",
       "      <td>5bfe91b074719d35745ae12203a.png</td>\n",
       "      <td>7887755.0</td>\n",
       "      <td>制药</td>\n",
       "      <td>[文案策划, 品牌策划, 广告策划, 市场策划, 媒介策划, 活动策划, 新闻策划, 门户网...</td>\n",
       "      <td>15-20k</td>\n",
       "      <td>...</td>\n",
       "      <td>True</td>\n",
       "      <td>d_sfrom=search_prime&amp;d_ckId=null&amp;d_curPage=0&amp;d...</td>\n",
       "      <td>e125ab15a243fadf9db142f8a7c198c4</td>\n",
       "      <td>False</td>\n",
       "      <td>cd5d1ab00be1dd1855a0b6511a508218</td>\n",
       "      <td>2</td>\n",
       "      <td>兰女士</td>\n",
       "      <td>人事</td>\n",
       "      <td>5f8f9866dfb13a7dee342f1808u.jpg</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>%7B%22ckId%22%3A%22y2jy1uvl2gar8xipyemg77rijoo...</td>\n",
       "      <td>{\"jobKind\":\"2\",\"imId\":\"4b20c0c650c528b9ee7b65a...</td>\n",
       "      <td>500-999人</td>\n",
       "      <td>https://www.liepin.com/company/9902859/</td>\n",
       "      <td>爱迪特(秦皇岛)科技股份有限公司</td>\n",
       "      <td>5d0c6510501544662ca346b306u.jpg</td>\n",
       "      <td>9902859.0</td>\n",
       "      <td>机械/制造</td>\n",
       "      <td>[客户管理, 销售管理]</td>\n",
       "      <td>12-24k</td>\n",
       "      <td>...</td>\n",
       "      <td>True</td>\n",
       "      <td>d_sfrom=search_prime&amp;d_ckId=null&amp;d_curPage=0&amp;d...</td>\n",
       "      <td>8e835b7fa013a333c720b79d71ff1742</td>\n",
       "      <td>False</td>\n",
       "      <td>4b20c0c650c528b9ee7b65a82243fe9b</td>\n",
       "      <td>2</td>\n",
       "      <td>钟先生</td>\n",
       "      <td>招聘经理</td>\n",
       "      <td>63abf9999e48870356632a2906u.png</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>%7B%22ckId%22%3A%22y2jy1uvl2gar8xipyemg77rijoo...</td>\n",
       "      <td>{\"jobKind\":\"2\",\"imId\":\"ce5ba37b5b3d556c7db9425...</td>\n",
       "      <td>1000-2000人</td>\n",
       "      <td>https://www.liepin.com/company/7921271/</td>\n",
       "      <td>小红书</td>\n",
       "      <td>5952248270327b30a4cc59d605a.jpg</td>\n",
       "      <td>7921271.0</td>\n",
       "      <td>互联网</td>\n",
       "      <td>[商家运营, 达人运营, KOL运营]</td>\n",
       "      <td>20-35k·16薪</td>\n",
       "      <td>...</td>\n",
       "      <td>True</td>\n",
       "      <td>d_sfrom=search_prime&amp;d_ckId=null&amp;d_curPage=0&amp;d...</td>\n",
       "      <td>be838138b1ab03fc2487db4d7a2a8bd6</td>\n",
       "      <td>False</td>\n",
       "      <td>ce5ba37b5b3d556c7db94255d9736b5c</td>\n",
       "      <td>2</td>\n",
       "      <td>齐女士</td>\n",
       "      <td>HR</td>\n",
       "      <td>658b85aebe7c312375eaaf4a03u.jpg</td>\n",
       "      <td>D轮</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>%7B%22ckId%22%3A%22y2jy1uvl2gar8xipyemg77rijoo...</td>\n",
       "      <td>{\"jobKind\":\"1\",\"imId\":\"c0da9fe6904832c14a7a04e...</td>\n",
       "      <td>50-99人</td>\n",
       "      <td></td>\n",
       "      <td>某深圳计算机软件公司</td>\n",
       "      <td>60e2fe0bf3df194a3c48adb502u.png</td>\n",
       "      <td>NaN</td>\n",
       "      <td>计算机软件</td>\n",
       "      <td>[广告投放, 信息流投放, 电商平台投放, 搜索引擎投放, 广告数据分析, 投放策略, 数据...</td>\n",
       "      <td>25-35k·14薪</td>\n",
       "      <td>...</td>\n",
       "      <td>False</td>\n",
       "      <td>d_sfrom=search_prime&amp;d_ckId=null&amp;d_curPage=0&amp;d...</td>\n",
       "      <td>b93daebfdc21e2d66442dceb2069d7e2</td>\n",
       "      <td>False</td>\n",
       "      <td>c0da9fe6904832c14a7a04e7d95591ea</td>\n",
       "      <td>2</td>\n",
       "      <td>魏先生</td>\n",
       "      <td>猎头顾问</td>\n",
       "      <td>642395e88177f553788841e308u.jpeg</td>\n",
       "      <td>融资未公开</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>%7B%22ckId%22%3A%22y2jy1uvl2gar8xipyemg77rijoo...</td>\n",
       "      <td>{\"jobKind\":\"1\",\"imId\":\"36bcd620cdbc0b3667766a0...</td>\n",
       "      <td>50-99人</td>\n",
       "      <td></td>\n",
       "      <td>某深圳计算机软件公司</td>\n",
       "      <td>60e2fe0bf3df194a3c48adb502u.png</td>\n",
       "      <td>NaN</td>\n",
       "      <td>计算机软件</td>\n",
       "      <td>[数据分析, 账户管理, 活动策划, 市场营销, 信息流, 广告/传媒/文化]</td>\n",
       "      <td>20-30k</td>\n",
       "      <td>...</td>\n",
       "      <td>False</td>\n",
       "      <td>d_sfrom=search_prime&amp;d_ckId=null&amp;d_curPage=0&amp;d...</td>\n",
       "      <td>d7a0b5ff5b5cff5b90461569440a971e</td>\n",
       "      <td>False</td>\n",
       "      <td>36bcd620cdbc0b3667766a03c68ce883</td>\n",
       "      <td>2</td>\n",
       "      <td>何女士</td>\n",
       "      <td>猎头顾问</td>\n",
       "      <td>6574063d1a900b7e85cf540507u.png</td>\n",
       "      <td>融资未公开</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>35</th>\n",
       "      <td>%7B%22sfrom%22%3A%22search_job_pc%22%2C%22d_cu...</td>\n",
       "      <td>{\"imId\":\"773f6a3cc120f016882b84a174d57208\",\"im...</td>\n",
       "      <td>100-499人</td>\n",
       "      <td>https://www.liepin.com/company/12147243/</td>\n",
       "      <td>深圳库犸科技有限公司</td>\n",
       "      <td>65827eace0ce0251c2afdf5305u.png</td>\n",
       "      <td>12147243.0</td>\n",
       "      <td>智能硬件</td>\n",
       "      <td>[]</td>\n",
       "      <td>20-35k</td>\n",
       "      <td>...</td>\n",
       "      <td>False</td>\n",
       "      <td>d_sfrom=search_prime&amp;d_ckId=null&amp;d_curPage=9&amp;d...</td>\n",
       "      <td>4f2f3a52b9be1b3533602513f20e346d</td>\n",
       "      <td>False</td>\n",
       "      <td>773f6a3cc120f016882b84a174d57208</td>\n",
       "      <td>2</td>\n",
       "      <td>刘女士</td>\n",
       "      <td>招聘主管</td>\n",
       "      <td>5f8f9865ea60860b75384fa508u.jpg</td>\n",
       "      <td>B轮</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>36</th>\n",
       "      <td>%7B%22sfrom%22%3A%22search_job_pc%22%2C%22d_cu...</td>\n",
       "      <td>{\"imId\":\"ee291532b4048c4e9ccf3dc45f6d7696\",\"im...</td>\n",
       "      <td>10000人以上</td>\n",
       "      <td>https://www.liepin.com/company/2020322/</td>\n",
       "      <td>唯品会(中国)</td>\n",
       "      <td>5d3f908a81fb1a0d6f60102105u.jpg</td>\n",
       "      <td>2020322.0</td>\n",
       "      <td>互联网</td>\n",
       "      <td>[策略运营, 电子商务, 广告投放/流量运营, 电商平台]</td>\n",
       "      <td>14-18k·14薪</td>\n",
       "      <td>...</td>\n",
       "      <td>False</td>\n",
       "      <td>d_sfrom=search_prime&amp;d_ckId=null&amp;d_curPage=9&amp;d...</td>\n",
       "      <td>bd976580a86cfa8643e05c5b8e40d663</td>\n",
       "      <td>False</td>\n",
       "      <td>ee291532b4048c4e9ccf3dc45f6d7696</td>\n",
       "      <td>2</td>\n",
       "      <td>董女士</td>\n",
       "      <td>HRBP经理</td>\n",
       "      <td>5f8f9863f6d1ab58476f246a08u.jpg</td>\n",
       "      <td>美股上市</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>37</th>\n",
       "      <td>%7B%22sfrom%22%3A%22search_job_pc%22%2C%22d_cu...</td>\n",
       "      <td>{\"imId\":\"59bcbcdae6c751c19b730e23f2bd8f83\",\"im...</td>\n",
       "      <td>10000人以上</td>\n",
       "      <td>https://www.liepin.com/company/7983148/</td>\n",
       "      <td>腾讯</td>\n",
       "      <td>5bfe919474719d35745adb7903a.png</td>\n",
       "      <td>7983148.0</td>\n",
       "      <td>互联网</td>\n",
       "      <td>[策略运营]</td>\n",
       "      <td>30-60k·16薪</td>\n",
       "      <td>...</td>\n",
       "      <td>False</td>\n",
       "      <td>d_sfrom=search_prime&amp;d_ckId=null&amp;d_curPage=9&amp;d...</td>\n",
       "      <td>9b9df35600ba60d4892cd874fa48e31c</td>\n",
       "      <td>False</td>\n",
       "      <td>59bcbcdae6c751c19b730e23f2bd8f83</td>\n",
       "      <td>2</td>\n",
       "      <td>彭先生</td>\n",
       "      <td>HR</td>\n",
       "      <td>5f8f9868f6d1ab58476f24a008u.jpg</td>\n",
       "      <td>已上市</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>38</th>\n",
       "      <td>%7B%22sfrom%22%3A%22search_job_pc%22%2C%22d_cu...</td>\n",
       "      <td>{\"imId\":\"7913ac1ddf605cb7fb8879f236822d2d\",\"im...</td>\n",
       "      <td>50-99人</td>\n",
       "      <td></td>\n",
       "      <td>某国内电子商务公司</td>\n",
       "      <td>60e2fe0bf3df194a3c48adb502u.png</td>\n",
       "      <td>NaN</td>\n",
       "      <td>电子商务</td>\n",
       "      <td>[家居卫浴, 谷歌投放, Google, GA分析]</td>\n",
       "      <td>20-30k·18薪</td>\n",
       "      <td>...</td>\n",
       "      <td>False</td>\n",
       "      <td>d_sfrom=search_prime&amp;d_ckId=null&amp;d_curPage=9&amp;d...</td>\n",
       "      <td>f66f0f88dfbdd9b92ae959d80ebadea7</td>\n",
       "      <td>False</td>\n",
       "      <td>7913ac1ddf605cb7fb8879f236822d2d</td>\n",
       "      <td>2</td>\n",
       "      <td>张先生</td>\n",
       "      <td>猎头顾问</td>\n",
       "      <td>63e4b365b9753a51527de75d03u.png</td>\n",
       "      <td>不需要融资</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>39</th>\n",
       "      <td>%7B%22sfrom%22%3A%22search_job_pc%22%2C%22d_cu...</td>\n",
       "      <td>{\"imId\":\"76f0e5912d8a29d8f4067025f1d6ce6f\",\"im...</td>\n",
       "      <td>500-999人</td>\n",
       "      <td>https://www.liepin.com/company/1840913/</td>\n",
       "      <td>盛天网络</td>\n",
       "      <td>5d50c292cd394174d09ab1f304u.png</td>\n",
       "      <td>1840913.0</td>\n",
       "      <td>互联网</td>\n",
       "      <td>[]</td>\n",
       "      <td>10-15k·14薪</td>\n",
       "      <td>...</td>\n",
       "      <td>False</td>\n",
       "      <td>d_sfrom=search_prime&amp;d_ckId=null&amp;d_curPage=9&amp;d...</td>\n",
       "      <td>91069ed2791a3b1902d5f3cfa4e3163b</td>\n",
       "      <td>False</td>\n",
       "      <td>76f0e5912d8a29d8f4067025f1d6ce6f</td>\n",
       "      <td>2</td>\n",
       "      <td>师先生</td>\n",
       "      <td></td>\n",
       "      <td>5f8f986c79c7cc70efbf36c808u.jpg</td>\n",
       "      <td>创业板上市</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>400 rows × 31 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                                             dataInfo  \\\n",
       "0   %7B%22ckId%22%3A%22y2jy1uvl2gar8xipyemg77rijoo...   \n",
       "1   %7B%22ckId%22%3A%22y2jy1uvl2gar8xipyemg77rijoo...   \n",
       "2   %7B%22ckId%22%3A%22y2jy1uvl2gar8xipyemg77rijoo...   \n",
       "3   %7B%22ckId%22%3A%22y2jy1uvl2gar8xipyemg77rijoo...   \n",
       "4   %7B%22ckId%22%3A%22y2jy1uvl2gar8xipyemg77rijoo...   \n",
       "..                                                ...   \n",
       "35  %7B%22sfrom%22%3A%22search_job_pc%22%2C%22d_cu...   \n",
       "36  %7B%22sfrom%22%3A%22search_job_pc%22%2C%22d_cu...   \n",
       "37  %7B%22sfrom%22%3A%22search_job_pc%22%2C%22d_cu...   \n",
       "38  %7B%22sfrom%22%3A%22search_job_pc%22%2C%22d_cu...   \n",
       "39  %7B%22sfrom%22%3A%22search_job_pc%22%2C%22d_cu...   \n",
       "\n",
       "                                           dataParams comp.compScale  \\\n",
       "0   {\"jobKind\":\"2\",\"imId\":\"cd5d1ab00be1dd1855a0b65...          1-49人   \n",
       "1   {\"jobKind\":\"2\",\"imId\":\"4b20c0c650c528b9ee7b65a...       500-999人   \n",
       "2   {\"jobKind\":\"2\",\"imId\":\"ce5ba37b5b3d556c7db9425...     1000-2000人   \n",
       "3   {\"jobKind\":\"1\",\"imId\":\"c0da9fe6904832c14a7a04e...         50-99人   \n",
       "4   {\"jobKind\":\"1\",\"imId\":\"36bcd620cdbc0b3667766a0...         50-99人   \n",
       "..                                                ...            ...   \n",
       "35  {\"imId\":\"773f6a3cc120f016882b84a174d57208\",\"im...       100-499人   \n",
       "36  {\"imId\":\"ee291532b4048c4e9ccf3dc45f6d7696\",\"im...       10000人以上   \n",
       "37  {\"imId\":\"59bcbcdae6c751c19b730e23f2bd8f83\",\"im...       10000人以上   \n",
       "38  {\"imId\":\"7913ac1ddf605cb7fb8879f236822d2d\",\"im...         50-99人   \n",
       "39  {\"imId\":\"76f0e5912d8a29d8f4067025f1d6ce6f\",\"im...       500-999人   \n",
       "\n",
       "                                   comp.link     comp.compName  \\\n",
       "0    https://www.liepin.com/company/7887755/  北京志健金瑞生物医药科技有限公司   \n",
       "1    https://www.liepin.com/company/9902859/  爱迪特(秦皇岛)科技股份有限公司   \n",
       "2    https://www.liepin.com/company/7921271/               小红书   \n",
       "3                                                   某深圳计算机软件公司   \n",
       "4                                                   某深圳计算机软件公司   \n",
       "..                                       ...               ...   \n",
       "35  https://www.liepin.com/company/12147243/        深圳库犸科技有限公司   \n",
       "36   https://www.liepin.com/company/2020322/           唯品会(中国)   \n",
       "37   https://www.liepin.com/company/7983148/                腾讯   \n",
       "38                                                   某国内电子商务公司   \n",
       "39   https://www.liepin.com/company/1840913/              盛天网络   \n",
       "\n",
       "                      comp.compLogo  comp.compId comp.compIndustry  \\\n",
       "0   5bfe91b074719d35745ae12203a.png    7887755.0                制药   \n",
       "1   5d0c6510501544662ca346b306u.jpg    9902859.0             机械/制造   \n",
       "2   5952248270327b30a4cc59d605a.jpg    7921271.0               互联网   \n",
       "3   60e2fe0bf3df194a3c48adb502u.png          NaN             计算机软件   \n",
       "4   60e2fe0bf3df194a3c48adb502u.png          NaN             计算机软件   \n",
       "..                              ...          ...               ...   \n",
       "35  65827eace0ce0251c2afdf5305u.png   12147243.0              智能硬件   \n",
       "36  5d3f908a81fb1a0d6f60102105u.jpg    2020322.0               互联网   \n",
       "37  5bfe919474719d35745adb7903a.png    7983148.0               互联网   \n",
       "38  60e2fe0bf3df194a3c48adb502u.png          NaN              电子商务   \n",
       "39  5d50c292cd394174d09ab1f304u.png    1840913.0               互联网   \n",
       "\n",
       "                                           job.labels  job.salary  ...  \\\n",
       "0   [文案策划, 品牌策划, 广告策划, 市场策划, 媒介策划, 活动策划, 新闻策划, 门户网...      15-20k  ...   \n",
       "1                                        [客户管理, 销售管理]      12-24k  ...   \n",
       "2                                 [商家运营, 达人运营, KOL运营]  20-35k·16薪  ...   \n",
       "3   [广告投放, 信息流投放, 电商平台投放, 搜索引擎投放, 广告数据分析, 投放策略, 数据...  25-35k·14薪  ...   \n",
       "4             [数据分析, 账户管理, 活动策划, 市场营销, 信息流, 广告/传媒/文化]      20-30k  ...   \n",
       "..                                                ...         ...  ...   \n",
       "35                                                 []      20-35k  ...   \n",
       "36                      [策略运营, 电子商务, 广告投放/流量运营, 电商平台]  14-18k·14薪  ...   \n",
       "37                                             [策略运营]  30-60k·16薪  ...   \n",
       "38                         [家居卫浴, 谷歌投放, Google, GA分析]  20-30k·18薪  ...   \n",
       "39                                                 []  10-15k·14薪  ...   \n",
       "\n",
       "   job.advViewFlag                                     job.dataPromId  \\\n",
       "0             True  d_sfrom=search_prime&d_ckId=null&d_curPage=0&d...   \n",
       "1             True  d_sfrom=search_prime&d_ckId=null&d_curPage=0&d...   \n",
       "2             True  d_sfrom=search_prime&d_ckId=null&d_curPage=0&d...   \n",
       "3            False  d_sfrom=search_prime&d_ckId=null&d_curPage=0&d...   \n",
       "4            False  d_sfrom=search_prime&d_ckId=null&d_curPage=0&d...   \n",
       "..             ...                                                ...   \n",
       "35           False  d_sfrom=search_prime&d_ckId=null&d_curPage=9&d...   \n",
       "36           False  d_sfrom=search_prime&d_ckId=null&d_curPage=9&d...   \n",
       "37           False  d_sfrom=search_prime&d_ckId=null&d_curPage=9&d...   \n",
       "38           False  d_sfrom=search_prime&d_ckId=null&d_curPage=9&d...   \n",
       "39           False  d_sfrom=search_prime&d_ckId=null&d_curPage=9&d...   \n",
       "\n",
       "               recruiter.recruiterId recruiter.chatted  \\\n",
       "0   e125ab15a243fadf9db142f8a7c198c4             False   \n",
       "1   8e835b7fa013a333c720b79d71ff1742             False   \n",
       "2   be838138b1ab03fc2487db4d7a2a8bd6             False   \n",
       "3   b93daebfdc21e2d66442dceb2069d7e2             False   \n",
       "4   d7a0b5ff5b5cff5b90461569440a971e             False   \n",
       "..                               ...               ...   \n",
       "35  4f2f3a52b9be1b3533602513f20e346d             False   \n",
       "36  bd976580a86cfa8643e05c5b8e40d663             False   \n",
       "37  9b9df35600ba60d4892cd874fa48e31c             False   \n",
       "38  f66f0f88dfbdd9b92ae959d80ebadea7             False   \n",
       "39  91069ed2791a3b1902d5f3cfa4e3163b             False   \n",
       "\n",
       "                      recruiter.imId recruiter.imUserType  \\\n",
       "0   cd5d1ab00be1dd1855a0b6511a508218                    2   \n",
       "1   4b20c0c650c528b9ee7b65a82243fe9b                    2   \n",
       "2   ce5ba37b5b3d556c7db94255d9736b5c                    2   \n",
       "3   c0da9fe6904832c14a7a04e7d95591ea                    2   \n",
       "4   36bcd620cdbc0b3667766a03c68ce883                    2   \n",
       "..                               ...                  ...   \n",
       "35  773f6a3cc120f016882b84a174d57208                    2   \n",
       "36  ee291532b4048c4e9ccf3dc45f6d7696                    2   \n",
       "37  59bcbcdae6c751c19b730e23f2bd8f83                    2   \n",
       "38  7913ac1ddf605cb7fb8879f236822d2d                    2   \n",
       "39  76f0e5912d8a29d8f4067025f1d6ce6f                    2   \n",
       "\n",
       "   recruiter.recruiterName recruiter.recruiterTitle  \\\n",
       "0                      兰女士                       人事   \n",
       "1                      钟先生                     招聘经理   \n",
       "2                      齐女士                       HR   \n",
       "3                      魏先生                     猎头顾问   \n",
       "4                      何女士                     猎头顾问   \n",
       "..                     ...                      ...   \n",
       "35                     刘女士                     招聘主管   \n",
       "36                     董女士                   HRBP经理   \n",
       "37                     彭先生                       HR   \n",
       "38                     张先生                     猎头顾问   \n",
       "39                     师先生                            \n",
       "\n",
       "            recruiter.recruiterPhoto comp.compStage  \n",
       "0    5f8f9866dfb13a7dee342f1808u.jpg            NaN  \n",
       "1    63abf9999e48870356632a2906u.png            NaN  \n",
       "2    658b85aebe7c312375eaaf4a03u.jpg             D轮  \n",
       "3   642395e88177f553788841e308u.jpeg          融资未公开  \n",
       "4    6574063d1a900b7e85cf540507u.png          融资未公开  \n",
       "..                               ...            ...  \n",
       "35   5f8f9865ea60860b75384fa508u.jpg             B轮  \n",
       "36   5f8f9863f6d1ab58476f246a08u.jpg           美股上市  \n",
       "37   5f8f9868f6d1ab58476f24a008u.jpg            已上市  \n",
       "38   63e4b365b9753a51527de75d03u.png          不需要融资  \n",
       "39   5f8f986c79c7cc70efbf36c808u.jpg          创业板上市  \n",
       "\n",
       "[400 rows x 31 columns]"
      ]
     },
     "execution_count": 1,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "import crawl_liepin\n",
    "\n",
    "# Baseline run: search Shenzhen (深圳) advertising (广告) postings without passing 登录cookie.\n",
    "baseline_results = crawl_liepin.crawl(\n",
    "    城市=\"深圳\",\n",
    "    关键词=\"广告\",\n",
    "    学历='本科',\n",
    "    工作经验='',\n",
    ")\n",
    "# Echo the result as the cell's last expression so the notebook renders it.\n",
    "baseline_results"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# cookies实现登录，获取完整数据"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "'__gc_id=72ec0caa79ef4ee0bf7232d23b95a349; _ga=GA1.1.1375856594.1681904278; __uuid=1681904283335.17; __tlog=1701425302634.08%7C00000000%7C00000000%7Csm_pc_003%7Csm_pc_003; XSRF-TOKEN=HuFQfP6JRByGViwOkv9YhQ; Hm_lvt_a2647413544f5a04f00da7eee0d5e200=1701343478,1701425307; _ga_54YTJKWN86=GS1.1.1701440724.12.1.1701441044.0.0.0; __session_seq=8; __tlg_event_seq=61; Hm_lpvt_a2647413544f5a04f00da7eee0d5e200=1701441045'"
      ]
     },
     "execution_count": 2,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "import os\n",
    "from getpass import getpass\n",
    "\n",
    "# Login cookie handed to crawl_liepin.crawl(登录cookie=...) in the next cell.\n",
    "# It is a credential, so it is read from the LIEPIN_COOKIE environment variable,\n",
    "# falling back to a non-echoing prompt, instead of being hardcoded in the notebook.\n",
    "# The value is deliberately not echoed: cell outputs are saved with the notebook file.\n",
    "cookie = os.environ.get(\"LIEPIN_COOKIE\") or getpass(\"Liepin login cookie: \")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "登录cookie __gc_id=72ec0caa79ef4ee0bf7232d23b95a349; _ga=GA1.1.1375856594.1681904278; __uuid=1681904283335.17; __tlog=1701425302634.08%7C00000000%7C00000000%7Csm_pc_003%7Csm_pc_003; XSRF-TOKEN=HuFQfP6JRByGViwOkv9YhQ; Hm_lvt_a2647413544f5a04f00da7eee0d5e200=1701343478,1701425307; _ga_54YTJKWN86=GS1.1.1701440724.12.1.1701441044.0.0.0; __session_seq=8; __tlg_event_seq=61; Hm_lpvt_a2647413544f5a04f00da7eee0d5e200=1701441045\n",
      "这是第1页，接下来将先等待8秒...然后以继续抓取\n",
      "这是第2页，接下来将先等待6秒...然后以继续抓取\n",
      "这是第3页，接下来将先等待10秒...然后以继续抓取\n",
      "这是第4页，接下来将先等待8秒...然后以继续抓取\n",
      "这是第5页，接下来将先等待3秒...然后以继续抓取\n",
      "这是第6页，接下来将先等待3秒...然后以继续抓取\n",
      "这是第7页，接下来将先等待10秒...然后以继续抓取\n",
      "这是第8页，接下来将先等待7秒...然后以继续抓取\n",
      "这是第9页，接下来将先等待6秒...然后以继续抓取\n",
      "这是第10页，接下来将先等待4秒...然后以继续抓取\n"
     ]
    }
   ],
   "source": [
    "import crawl_liepin\n",
    "\n",
    "# Run the Shenzhen advertising search with the login cookie and keep the result\n",
    "# under a name so the following cells can relabel and export it.\n",
    "广告_深圳_results = crawl_liepin.crawl(\n",
    "    城市=\"深圳\",\n",
    "    关键词=\"广告\",\n",
    "    学历='本科',\n",
    "    工作经验='',\n",
    "    登录cookie=cookie,\n",
    ")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Chinese display labels for the crawler's dotted column names (job.*, comp.*, recruiter.*).\n",
    "column_labels = {\n",
    "    'job.labels': '职位标签',\n",
    "    'job.refreshTime': '职位更新时间',\n",
    "    'job.title': '职位',\n",
    "    'job.salary': '薪资',\n",
    "    'job.dq': '地区',\n",
    "    'job.topJob': '是否top职位',\n",
    "    'job.link': '链接',\n",
    "    'job.requireEduLevel': '学历要求',\n",
    "    'job.requireWorkYears': '工作经验',\n",
    "    'comp.compStage': '公司融资情况',\n",
    "    'comp.compName': '公司名称',\n",
    "    'comp.compIndustry': '行业',\n",
    "    'comp.compScale': '规模',\n",
    "    'recruiter.recruiterName': 'HR',\n",
    "}\n",
    "\n",
    "# Only the columns listed above are relabelled; the result replaces the previous binding.\n",
    "广告_深圳_results = 广告_深圳_results.rename(columns=column_labels)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Save the results table as an Excel workbook (relative path, default to_excel options).\n",
    "output_path = \"广告_深圳_results.xlsx\"\n",
    "广告_深圳_results.to_excel(output_path)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.11.0"
  },
  "toc": {
   "base_numbering": 1,
   "nav_menu": {},
   "number_sections": true,
   "sideBar": true,
   "skip_h1_title": false,
   "title_cell": "Table of Contents",
   "title_sidebar": "Contents",
   "toc_cell": false,
   "toc_position": {},
   "toc_section_display": true,
   "toc_window_display": false
  }
 },
 "nbformat": 4,
 "nbformat_minor": 4
}
